{ "cells": [ { "cell_type": "markdown", "id": "bd100442", "metadata": {}, "source": [ "# 房价预测" ] }, { "cell_type": "code", "execution_count": 1, "id": "cb4b9ea0", "metadata": { "ExecuteTime": { "end_time": "2023-10-10T10:23:54.958717Z", "start_time": "2023-10-10T10:23:53.586353Z" } }, "outputs": [], "source": [ "import pandas as pd" ] }, { "cell_type": "code", "execution_count": 2, "id": "d9805d3f", "metadata": { "ExecuteTime": { "end_time": "2023-10-10T10:24:11.692626Z", "start_time": "2023-10-10T10:24:11.557044Z" } }, "outputs": [], "source": [ "data = pd.read_csv('load_kc_house_data.csv')" ] }, { "cell_type": "code", "execution_count": 3, "id": "817bf0da", "metadata": { "ExecuteTime": { "end_time": "2023-10-10T10:24:14.333523Z", "start_time": "2023-10-10T10:24:14.247015Z" } }, "outputs": [ { "data": { "text/html": [ "
\n", " | id | \n", "date | \n", "price | \n", "bedrooms | \n", "bathrooms | \n", "sqft_living | \n", "sqft_lot | \n", "floors | \n", "waterfront | \n", "view | \n", "... | \n", "grade | \n", "sqft_above | \n", "sqft_basement | \n", "yr_built | \n", "yr_renovated | \n", "zipcode | \n", "lat | \n", "long | \n", "sqft_living15 | \n", "sqft_lot15 | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "7129300520 | \n", "20141013T000000 | \n", "221900.0 | \n", "3 | \n", "1.00 | \n", "1180 | \n", "5650 | \n", "1.0 | \n", "0 | \n", "0 | \n", "... | \n", "7 | \n", "1180 | \n", "0 | \n", "1955 | \n", "0 | \n", "98178 | \n", "47.5112 | \n", "-122.257 | \n", "1340 | \n", "5650 | \n", "
1 | \n", "6414100192 | \n", "20141209T000000 | \n", "538000.0 | \n", "3 | \n", "2.25 | \n", "2570 | \n", "7242 | \n", "2.0 | \n", "0 | \n", "0 | \n", "... | \n", "7 | \n", "2170 | \n", "400 | \n", "1951 | \n", "1991 | \n", "98125 | \n", "47.7210 | \n", "-122.319 | \n", "1690 | \n", "7639 | \n", "
2 | \n", "5631500400 | \n", "20150225T000000 | \n", "180000.0 | \n", "2 | \n", "1.00 | \n", "770 | \n", "10000 | \n", "1.0 | \n", "0 | \n", "0 | \n", "... | \n", "6 | \n", "770 | \n", "0 | \n", "1933 | \n", "0 | \n", "98028 | \n", "47.7379 | \n", "-122.233 | \n", "2720 | \n", "8062 | \n", "
3 | \n", "2487200875 | \n", "20141209T000000 | \n", "604000.0 | \n", "4 | \n", "3.00 | \n", "1960 | \n", "5000 | \n", "1.0 | \n", "0 | \n", "0 | \n", "... | \n", "7 | \n", "1050 | \n", "910 | \n", "1965 | \n", "0 | \n", "98136 | \n", "47.5208 | \n", "-122.393 | \n", "1360 | \n", "5000 | \n", "
4 | \n", "1954400510 | \n", "20150218T000000 | \n", "510000.0 | \n", "3 | \n", "2.00 | \n", "1680 | \n", "8080 | \n", "1.0 | \n", "0 | \n", "0 | \n", "... | \n", "8 | \n", "1680 | \n", "0 | \n", "1987 | \n", "0 | \n", "98074 | \n", "47.6168 | \n", "-122.045 | \n", "1800 | \n", "7503 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
21608 | \n", "263000018 | \n", "20140521T000000 | \n", "360000.0 | \n", "3 | \n", "2.50 | \n", "1530 | \n", "1131 | \n", "3.0 | \n", "0 | \n", "0 | \n", "... | \n", "8 | \n", "1530 | \n", "0 | \n", "2009 | \n", "0 | \n", "98103 | \n", "47.6993 | \n", "-122.346 | \n", "1530 | \n", "1509 | \n", "
21609 | \n", "6600060120 | \n", "20150223T000000 | \n", "400000.0 | \n", "4 | \n", "2.50 | \n", "2310 | \n", "5813 | \n", "2.0 | \n", "0 | \n", "0 | \n", "... | \n", "8 | \n", "2310 | \n", "0 | \n", "2014 | \n", "0 | \n", "98146 | \n", "47.5107 | \n", "-122.362 | \n", "1830 | \n", "7200 | \n", "
21610 | \n", "1523300141 | \n", "20140623T000000 | \n", "402101.0 | \n", "2 | \n", "0.75 | \n", "1020 | \n", "1350 | \n", "2.0 | \n", "0 | \n", "0 | \n", "... | \n", "7 | \n", "1020 | \n", "0 | \n", "2009 | \n", "0 | \n", "98144 | \n", "47.5944 | \n", "-122.299 | \n", "1020 | \n", "2007 | \n", "
21611 | \n", "291310100 | \n", "20150116T000000 | \n", "400000.0 | \n", "3 | \n", "2.50 | \n", "1600 | \n", "2388 | \n", "2.0 | \n", "0 | \n", "0 | \n", "... | \n", "8 | \n", "1600 | \n", "0 | \n", "2004 | \n", "0 | \n", "98027 | \n", "47.5345 | \n", "-122.069 | \n", "1410 | \n", "1287 | \n", "
21612 | \n", "1523300157 | \n", "20141015T000000 | \n", "325000.0 | \n", "2 | \n", "0.75 | \n", "1020 | \n", "1076 | \n", "2.0 | \n", "0 | \n", "0 | \n", "... | \n", "7 | \n", "1020 | \n", "0 | \n", "2008 | \n", "0 | \n", "98144 | \n", "47.5941 | \n", "-122.299 | \n", "1020 | \n", "1357 | \n", "
21613 rows × 21 columns
\n", "\n", " | bathrooms | \n", "view | \n", "bedrooms | \n", "condition | \n", "sqft_living | \n", "price | \n", "
---|---|---|---|---|---|---|
0 | \n", "1.00 | \n", "0 | \n", "3 | \n", "3 | \n", "1180 | \n", "221900.0 | \n", "
1 | \n", "2.25 | \n", "0 | \n", "3 | \n", "3 | \n", "2570 | \n", "538000.0 | \n", "
2 | \n", "1.00 | \n", "0 | \n", "2 | \n", "3 | \n", "770 | \n", "180000.0 | \n", "
3 | \n", "3.00 | \n", "0 | \n", "4 | \n", "5 | \n", "1960 | \n", "604000.0 | \n", "
4 | \n", "2.00 | \n", "0 | \n", "3 | \n", "3 | \n", "1680 | \n", "510000.0 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
21608 | \n", "2.50 | \n", "0 | \n", "3 | \n", "3 | \n", "1530 | \n", "360000.0 | \n", "
21609 | \n", "2.50 | \n", "0 | \n", "4 | \n", "3 | \n", "2310 | \n", "400000.0 | \n", "
21610 | \n", "0.75 | \n", "0 | \n", "2 | \n", "3 | \n", "1020 | \n", "402101.0 | \n", "
21611 | \n", "2.50 | \n", "0 | \n", "3 | \n", "3 | \n", "1600 | \n", "400000.0 | \n", "
21612 | \n", "0.75 | \n", "0 | \n", "2 | \n", "3 | \n", "1020 | \n", "325000.0 | \n", "
21613 rows × 6 columns
\n", "\n", " | bathrooms | \n", "view | \n", "bedrooms | \n", "condition | \n", "sqft_living | \n", "price | \n", "
---|---|---|---|---|---|---|
count | \n", "21613.000000 | \n", "21613.000000 | \n", "21613.000000 | \n", "21613.000000 | \n", "21613.000000 | \n", "2.161300e+04 | \n", "
mean | \n", "2.114757 | \n", "0.234303 | \n", "3.370842 | \n", "3.409430 | \n", "2079.899736 | \n", "5.400881e+05 | \n", "
std | \n", "0.770163 | \n", "0.766318 | \n", "0.930062 | \n", "0.650743 | \n", "918.440897 | \n", "3.671272e+05 | \n", "
min | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "1.000000 | \n", "290.000000 | \n", "7.500000e+04 | \n", "
25% | \n", "1.750000 | \n", "0.000000 | \n", "3.000000 | \n", "3.000000 | \n", "1427.000000 | \n", "3.219500e+05 | \n", "
50% | \n", "2.250000 | \n", "0.000000 | \n", "3.000000 | \n", "3.000000 | \n", "1910.000000 | \n", "4.500000e+05 | \n", "
75% | \n", "2.500000 | \n", "0.000000 | \n", "4.000000 | \n", "4.000000 | \n", "2550.000000 | \n", "6.450000e+05 | \n", "
max | \n", "8.000000 | \n", "4.000000 | \n", "33.000000 | \n", "5.000000 | \n", "13540.000000 | \n", "7.700000e+06 | \n", "
\n", " | bathrooms | \n", "view | \n", "bedrooms | \n", "condition | \n", "sqft_living | \n", "price | \n", "
---|---|---|---|---|---|---|
0 | \n", "1.00 | \n", "0 | \n", "3 | \n", "3 | \n", "1180 | \n", "221900.0 | \n", "
1 | \n", "2.25 | \n", "0 | \n", "3 | \n", "3 | \n", "2570 | \n", "538000.0 | \n", "
2 | \n", "1.00 | \n", "0 | \n", "2 | \n", "3 | \n", "770 | \n", "180000.0 | \n", "
3 | \n", "3.00 | \n", "0 | \n", "4 | \n", "5 | \n", "1960 | \n", "604000.0 | \n", "
4 | \n", "2.00 | \n", "0 | \n", "3 | \n", "3 | \n", "1680 | \n", "510000.0 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
21608 | \n", "2.50 | \n", "0 | \n", "3 | \n", "3 | \n", "1530 | \n", "360000.0 | \n", "
21609 | \n", "2.50 | \n", "0 | \n", "4 | \n", "3 | \n", "2310 | \n", "400000.0 | \n", "
21610 | \n", "0.75 | \n", "0 | \n", "2 | \n", "3 | \n", "1020 | \n", "402101.0 | \n", "
21611 | \n", "2.50 | \n", "0 | \n", "3 | \n", "3 | \n", "1600 | \n", "400000.0 | \n", "
21612 | \n", "0.75 | \n", "0 | \n", "2 | \n", "3 | \n", "1020 | \n", "325000.0 | \n", "
21613 rows × 6 columns
\n", "LinearRegression()In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
LinearRegression()